import requests
from bs4 import BeautifulSoup

# Script purpose: download one arXiv abstract page and print all of its
# visible text, one text fragment per line.
url = "https://arxiv.org/abs/2401.00005"

# Send a browser-like User-Agent instead of the default python-requests one.
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:91.0) Gecko/20100101 Firefox/91.0"
}

# requests applies no timeout unless one is given, so without this a stalled
# connection would block the script forever. Value is in seconds.
REQUEST_TIMEOUT_SECONDS = 10

# Fetch the page. Transport-level failures (DNS, refused connection, timeout,
# ...) all derive from requests.RequestException; report them and exit with a
# non-zero status rather than dumping a raw traceback.
try:
    response = requests.get(url, headers=headers, timeout=REQUEST_TIMEOUT_SECONDS)
except requests.RequestException as exc:
    raise SystemExit(f"请求失败: {exc}") from exc

# Only a plain 200 response is treated as success.
if response.status_code == 200:
    # Hand BeautifulSoup the raw bytes so it can work out the encoding itself.
    soup = BeautifulSoup(response.content, 'html.parser')

    # Collapse the document to text: strip each fragment and join with newlines.
    page_text = soup.get_text(separator='\n', strip=True)

    print(page_text)
else:
    print(f"无法访问页面，状态码: {response.status_code}")
